 % Conference paper (EMNLP-IJCNLP 2019). The title wording "An Unified" is kept
 % exactly as recorded in this database; verify against the published proceedings.
 @inproceedings{tsai,
  author    = {Tsai, Yao-Hung Hubert and Bai, Shaojie and Yamada, Makoto and Morency, Louis-Philippe and Salakhutdinov, Ruslan},
  title     = {Transformer Dissection: An Unified Understanding for {Transformer}'s Attention via the Lens of Kernel},
  booktitle = {Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing ({EMNLP-IJCNLP})},
  year      = {2019},
}